# Runs the nccl-tests all_reduce_perf benchmark as user "nccluser" with two
# MPI ranks on the local host.

# Step 1: switch to the nccluser account (starts a login shell for that user).
# NOTE(review): this reads as a sequence to type interactively. If the file is
# executed as a script instead, `su -` opens a new shell and the lines below
# only run after that shell exits, in the ORIGINAL user's shell -- confirm usage.
su - nccluser

# Step 2: enter the nccl-tests directory (the tests must already be built,
# since ./build/all_reduce_perf is invoked below).
cd ~/nccl-tests

# Step 3: prepare the environment for the run.
# Remove the locked-memory limit for this shell (presumably required for
# InfiniBand memory registration -- TODO confirm).
ulimit -l unlimited
# NCCL_DEBUG=INFO    : verbose NCCL logging.
# NCCL_IB_DISABLE=0  : leave the InfiniBand transport enabled.
# NCCL_IB_HCA        : the HCA:port pairs NCCL is allowed to use.
export NCCL_DEBUG=INFO \
       NCCL_IB_DISABLE=0 \
       NCCL_IB_HCA=mlx5_0:1,mlx5_1:1,mlx5_2:1,mlx5_3:1

# Step 4: launch the benchmark with 2 processes on localhost.
# Per the nccl-tests README: -b/-e are the minimum/maximum message sizes,
# -f is the multiplication factor between sizes, -g is GPUs per thread.
mpirun -np 2 -H localhost:2 \
  ./build/all_reduce_perf -b 8 -e 128M -f 2 -g 1